'''
* This is the project for the Brtc LlmOps Platform
* @Author Leon-liao <liaosiliang@alltman.com>
* @Description Study example: load a web page with WebBaseLoader and print the resulting documents
* @File: 4_study_url_loader.py
* @Time: 2025/8/20
* @All Rights Reserved by Brtc
'''
from langchain_community.document_loaders import UnstructuredExcelLoader, UnstructuredPowerPointLoader, \
    UnstructuredWordDocumentLoader, WebBaseLoader

# Page fetched by this demo.
TARGET_URL = "https://www.baidu.com"

# Build the loader for the target page, then load it into `docs`.
url_loader = WebBaseLoader(TARGET_URL)
docs = url_loader.load()

# Dump the whole loaded result first, then how many items came back.
print(docs)
doc_count = len(docs)
print(doc_count)

# Finally show the metadata attached to the first loaded item.
first_doc = docs[0]
print(first_doc.metadata)